setwd("../")
rm(list = ls())

# # only need to install once
# devtools::install_github("cloudyr/pyMTurkR", dependencies=TRUE)
# devtools::install_github("Luwei-Ying/validateIt", dependencies=TRUE)
# load R package
library(validateIt)

### load topic model
load('models/stm50k.Rdata')
# the two files below are omitted from this replication package for copyright reasons
# refer to the 0_preparation/fittopicmodel.R file to see how they are generated
load('models/stmPrep.Rdata')
load('models/heldout.Rdata')

### prepare tasks
newMass <- combMass(stm50k)
T8WSIstm50k <- validateTopic(type = "T8WSI", n = 500, text = stmPrep$meta$post_text[-heldout$missing$index],
                             vocab = newMass[[1]], beta = newMass[[2]], theta = stm50k$theta[-heldout$missing$index,], thres = 20)
goldT8WSI <- read.csv("goldstandard/goldT8WSI.csv", stringsAsFactors = FALSE)
T8WSIstm50k <- mixGold(tasks = T8WSIstm50k, golds = goldT8WSI)
T8WSIstm50k <- recordTasks(type = "T8WSI", tasks = T8WSIstm50k, path = "topicrecords/T8WSIstm50k.Rdata")

# ##### interact with Mturk from here #####
# ### environment
# library(pyMTurkR)
# Sys.setenv(AWS_ACCESS_KEY_ID = "AWS_ACCESS_KEY_ID")
# Sys.setenv(AWS_SECRET_ACCESS_KEY = "AWS_SECRET_ACCESS_KEY")
# options(pyMTurkR.sandbox = T) # Change sandbox = F when ready to run on MTurk
# AccountBalance()
# 
# ### send tasks (first trial)
# T8WSIstm50kids <- sendTasks(hit_type = 'find_from_dashboard', hit_layout = 'find_from_dashboard', type = "T8WSI",
#                             tasksrecord = T8WSIstm50k, HITidspath = "HITids/T8WSIstm50kids1.Rdata")
# ### extend HITs if needed
# for(i in T8WSIstm50kids[[1]]){
#   ExtendHIT(hit = i, add.seconds = 60*60*48)
# }
# 
# load("HITids/T8WSIstm50kids1.Rdata")
# T8WSIstm50kresults1 <- getResults(batch_id = "T8WSIstm50k1", hit_ids = HITids, retry = FALSE)
# write.csv(T8WSIstm50kresults1, "../../1_replication/1_topicvalidation/topicresults/T8WSIstm50kresults1.csv", row.names = FALSE)
# evalResults(results = T8WSIstm50kresults1, key = T8WSIstm50k, type = "T8WSI")
# 
# ### send tasks (second trial)
# T8WSIstm50kids <- sendTasks(hit_type = 'find_from_dashboard', hit_layout = 'find_from_dashboard', type = "T8WSI",
#                             tasksrecord = T8WSIstm50k, HITidspath = "HITids/T8WSIstm50kids2.Rdata")
# ### extend HITs if needed
# for(i in T8WSIstm50kids[[1]]){
#   ExtendHIT(hit = i, add.seconds = 60*60*48)
# }
# 
# load("HITids/T8WSIstm50kids2.Rdata")
# T8WSIstm50kresults2 <- getResults(batch_id = "T8WSIstm50k2", hit_ids = HITids, retry = FALSE)
# write.csv(T8WSIstm50kresults2, "../../1_replication/1_topicvalidation/topicresults/T8WSIstm50kresults2.csv", row.names = FALSE)
# evalResults(results = T8WSIstm50kresults2, key = T8WSIstm50k, type = "T8WSI")